<html xmlns:v="urn:schemas-microsoft-com:vml"
xmlns:o="urn:schemas-microsoft-com:office:office"
xmlns:w="urn:schemas-microsoft-com:office:word"
xmlns:dt="uuid:C2F41010-65B3-11d1-A29F-00AA00C14882"
xmlns:m="http://schemas.microsoft.com/office/2004/12/omml"
xmlns="http://www.w3.org/TR/REC-html40" xmlns:ns0="http://macVmlSchemaUri">

<head>
<meta http-equiv=Content-Type content="text/html; charset=unicode">
<meta name=ProgId content=Word.Document>
<meta name=Generator content="Microsoft Word 12">
<meta name=Originator content="Microsoft Word 12">
<link rel=File-List href="index_files/filelist.xml">
<link rel=Edit-Time-Data href="index_files/editdata.mso">
<!--[if !mso]>
<style>
v\:* {behavior:url(#default#VML);}
o\:* {behavior:url(#default#VML);}
w\:* {behavior:url(#default#VML);}
.shape {behavior:url(#default#VML);}
</style>
<![endif]-->
<title>StuTue-GeneiusVis-MC3</title>
<!--[if gte mso 9]><xml>
 <o:DocumentProperties>
  <o:Author>Kay Nieselt</o:Author>
  <o:Template>Normal</o:Template>
  <o:LastAuthor>Julian Heinrich</o:LastAuthor>
  <o:Revision>40</o:Revision>
  <o:LastPrinted>2010-06-29T12:07:00Z</o:LastPrinted>
  <o:Created>2010-06-29T16:02:00Z</o:Created>
  <o:LastSaved>2010-06-29T20:31:00Z</o:LastSaved>
  <o:Pages>5</o:Pages>
  <o:Words>2281</o:Words>
  <o:Characters>12228</o:Characters>
  <o:Company>Visualisierungsinstitut der Universität Stuttgart</o:Company>
  <o:Lines>291</o:Lines>
  <o:Paragraphs>75</o:Paragraphs>
  <o:CharactersWithSpaces>14434</o:CharactersWithSpaces>
  <o:Version>12.00</o:Version>
 </o:DocumentProperties>
 <o:CustomDocumentProperties>
  <o:_DocHome dt:dt="float">94053087</o:_DocHome>
 </o:CustomDocumentProperties>
 <o:OfficeDocumentSettings>
  <o:AllowPNG/>
 </o:OfficeDocumentSettings>
</xml><![endif]-->
<link rel=themeData href="index_files/themedata.thmx">
<link rel=colorSchemeMapping href="index_files/colorschememapping.xml">
<!--[if gte mso 9]><xml>
 <w:WordDocument>
  <w:Zoom>125</w:Zoom>
  <w:TrackMoves>false</w:TrackMoves>
  <w:TrackFormatting/>
  <w:HyphenationZone>21</w:HyphenationZone>
  <w:DisplayHorizontalDrawingGridEvery>0</w:DisplayHorizontalDrawingGridEvery>
  <w:DisplayVerticalDrawingGridEvery>0</w:DisplayVerticalDrawingGridEvery>
  <w:UseMarginsForDrawingGridOrigin/>
  <w:ValidateAgainstSchemas/>
  <w:SaveIfXMLInvalid>false</w:SaveIfXMLInvalid>
  <w:IgnoreMixedContent>false</w:IgnoreMixedContent>
  <w:AlwaysShowPlaceholderText>false</w:AlwaysShowPlaceholderText>
  <w:DoNotPromoteQF/>
  <w:LidThemeOther>DE</w:LidThemeOther>
  <w:LidThemeAsian>X-NONE</w:LidThemeAsian>
  <w:LidThemeComplexScript>X-NONE</w:LidThemeComplexScript>
  <w:Compatibility>
   <w:BreakWrappedTables/>
   <w:SnapToGridInCell/>
   <w:WrapTextWithPunct/>
   <w:UseAsianBreakRules/>
   <w:DontGrowAutofit/>
   <w:SplitPgBreakAndParaMark/>
   <w:DontVertAlignCellWithSp/>
   <w:DontBreakConstrainedForcedTables/>
   <w:DontVertAlignInTxbx/>
   <w:Word11KerningPairs/>
   <w:CachedColBalance/>
  </w:Compatibility>
  <w:BrowserLevel>MicrosoftInternetExplorer4</w:BrowserLevel>
  <m:mathPr>
   <m:mathFont m:val="Cambria Math"/>
   <m:brkBin m:val="before"/>
   <m:brkBinSub m:val="--"/>
   <m:smallFrac m:val="off"/>
   <m:dispDef/>
   <m:lMargin m:val="0"/>
   <m:rMargin m:val="0"/>
   <m:defJc m:val="centerGroup"/>
   <m:wrapIndent m:val="1440"/>
   <m:intLim m:val="subSup"/>
   <m:naryLim m:val="undOvr"/>
  </m:mathPr></w:WordDocument>
</xml><![endif]--><!--[if gte mso 9]><xml>
 <w:LatentStyles DefLockedState="false" DefUnhideWhenUsed="false"
  DefSemiHidden="false" DefQFormat="false" LatentStyleCount="267">
  <w:LsdException Locked="false" QFormat="true" Name="Normal"/>
  <w:LsdException Locked="false" QFormat="true" Name="heading 1"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   QFormat="true" Name="heading 2"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   QFormat="true" Name="heading 3"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   QFormat="true" Name="heading 4"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   QFormat="true" Name="heading 5"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   QFormat="true" Name="heading 6"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   QFormat="true" Name="heading 7"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   QFormat="true" Name="heading 8"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   QFormat="true" Name="heading 9"/>
  <w:LsdException Locked="false" QFormat="true" Name="caption"/>
  <w:LsdException Locked="false" QFormat="true" Name="Title"/>
  <w:LsdException Locked="false" Priority="1" Name="Default Paragraph Font"/>
  <w:LsdException Locked="false" QFormat="true" Name="Subtitle"/>
  <w:LsdException Locked="false" QFormat="true" Name="Strong"/>
  <w:LsdException Locked="false" QFormat="true" Name="Emphasis"/>
  <w:LsdException Locked="false" Priority="99" Name="No List"/>
  <w:LsdException Locked="false" QFormat="true" Name="No Spacing"/>
  <w:LsdException Locked="false" QFormat="true" Name="List Paragraph"/>
  <w:LsdException Locked="false" QFormat="true" Name="Quote"/>
  <w:LsdException Locked="false" QFormat="true" Name="Intense Quote"/>
  <w:LsdException Locked="false" QFormat="true" Name="Subtle Emphasis"/>
  <w:LsdException Locked="false" QFormat="true" Name="Intense Emphasis"/>
  <w:LsdException Locked="false" QFormat="true" Name="Subtle Reference"/>
  <w:LsdException Locked="false" QFormat="true" Name="Intense Reference"/>
  <w:LsdException Locked="false" QFormat="true" Name="Book Title"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   QFormat="true" Name="TOC Heading"/>
 </w:LatentStyles>
</xml><![endif]-->
<style>
<!--
 /* Font Definitions */
 @font-face
	{font-family:Helvetica;
	panose-1:2 11 6 4 2 2 2 2 2 4;
	mso-font-charset:0;
	mso-generic-font-family:swiss;
	mso-font-pitch:variable;
	mso-font-signature:-536859905 -1073711037 9 0 511 0;}
@font-face
	{font-family:"Cambria Math";
	panose-1:0 0 0 0 0 0 0 0 0 0;
	mso-font-charset:1;
	mso-generic-font-family:roman;
	mso-font-format:other;
	mso-font-pitch:variable;
	mso-font-signature:0 0 0 0 0 0;}
@font-face
	{font-family:Tahoma;
	panose-1:2 11 6 4 3 5 4 4 2 4;
	mso-font-charset:0;
	mso-generic-font-family:swiss;
	mso-font-pitch:variable;
	mso-font-signature:-520081665 -1073717157 41 0 66047 0;}
 /* Style Definitions */
 p.MsoNormal, li.MsoNormal, div.MsoNormal
	{mso-style-unhide:no;
	mso-style-qformat:yes;
	mso-style-parent:"";
	margin:0cm;
	margin-bottom:.0001pt;
	mso-pagination:widow-orphan;
	font-size:12.0pt;
	font-family:"Times New Roman","serif";
	mso-fareast-font-family:"Times New Roman";
	mso-fareast-theme-font:minor-fareast;
	mso-bidi-font-family:"Times New Roman";
	mso-bidi-theme-font:minor-bidi;}
p.MsoCaption, li.MsoCaption, div.MsoCaption
	{mso-style-unhide:no;
	mso-style-qformat:yes;
	mso-style-next:Normal;
	margin:0cm;
	margin-bottom:.0001pt;
	mso-pagination:widow-orphan;
	font-size:12.0pt;
	font-family:"Times New Roman","serif";
	mso-fareast-font-family:"Times New Roman";
	mso-fareast-theme-font:minor-fareast;
	mso-bidi-font-family:"Times New Roman";
	mso-bidi-theme-font:minor-bidi;
	font-weight:bold;}
a:link, span.MsoHyperlink
	{mso-style-unhide:no;
	color:blue;
	text-decoration:underline;
	text-underline:single;}
a:visited, span.MsoHyperlinkFollowed
	{mso-style-unhide:no;
	color:purple;
	text-decoration:underline;
	text-underline:single;}
p.MsoAcetate, li.MsoAcetate, div.MsoAcetate
	{mso-style-unhide:no;
	mso-style-link:"Sprechblasentext Zchn";
	margin:0cm;
	margin-bottom:.0001pt;
	mso-pagination:widow-orphan;
	font-size:8.0pt;
	font-family:"Tahoma","sans-serif";
	mso-fareast-font-family:"Times New Roman";
	mso-fareast-theme-font:minor-fareast;}
p.Normal, li.Normal, div.Normal
	{mso-style-name:Normal;
	mso-style-unhide:no;
	margin:0cm;
	margin-bottom:.0001pt;
	mso-pagination:widow-orphan;
	font-size:12.0pt;
	font-family:"Times New Roman","serif";
	mso-fareast-font-family:"Times New Roman";
	mso-fareast-theme-font:minor-fareast;
	mso-bidi-font-family:"Times New Roman";
	mso-bidi-theme-font:minor-bidi;}
span.SprechblasentextZchn
	{mso-style-name:"Sprechblasentext Zchn";
	mso-style-unhide:no;
	mso-style-locked:yes;
	mso-style-link:Sprechblasentext;
	mso-ansi-font-size:8.0pt;
	mso-bidi-font-size:8.0pt;
	font-family:"Tahoma","sans-serif";
	mso-ascii-font-family:Tahoma;
	mso-fareast-font-family:"Times New Roman";
	mso-fareast-theme-font:minor-fareast;
	mso-hansi-font-family:Tahoma;
	mso-bidi-font-family:Tahoma;}
p.BalloonText, li.BalloonText, div.BalloonText
	{mso-style-name:"Balloon Text";
	mso-style-unhide:no;
	mso-style-link:"Balloon Text Char";
	margin:0cm;
	margin-bottom:.0001pt;
	mso-pagination:widow-orphan;
	font-size:12.0pt;
	font-family:"Times New Roman","serif";
	mso-fareast-font-family:"Times New Roman";
	mso-fareast-theme-font:minor-fareast;
	mso-bidi-font-family:"Times New Roman";
	mso-bidi-theme-font:minor-bidi;}
span.BalloonTextChar
	{mso-style-name:"Balloon Text Char";
	mso-style-unhide:no;
	mso-style-locked:yes;
	mso-style-link:"Balloon Text";
	mso-ansi-font-size:8.0pt;
	mso-bidi-font-size:8.0pt;
	font-family:"Tahoma","sans-serif";
	mso-ascii-font-family:Tahoma;
	mso-fareast-font-family:"Times New Roman";
	mso-fareast-theme-font:minor-fareast;
	mso-hansi-font-family:Tahoma;
	mso-bidi-font-family:Tahoma;}
.MsoChpDefault
	{mso-style-type:export-only;
	mso-default-props:yes;
	font-size:10.0pt;
	mso-ansi-font-size:10.0pt;
	mso-bidi-font-size:10.0pt;}
@page Section1
	{size:595.0pt 842.0pt;
	margin:72.0pt 90.0pt 72.0pt 90.0pt;
	mso-header-margin:35.4pt;
	mso-footer-margin:35.4pt;
	mso-paper-source:0;}
div.Section1
	{page:Section1;}
-->
</style>
<!--[if gte mso 10]>
<style>
 /* Style Definitions */
 table.MsoNormalTable
	{mso-style-name:"Normale Tabelle";
	mso-tstyle-rowband-size:0;
	mso-tstyle-colband-size:0;
	mso-style-noshow:yes;
	mso-style-priority:99;
	mso-style-qformat:yes;
	mso-style-parent:"";
	mso-padding-alt:0cm 5.4pt 0cm 5.4pt;
	mso-para-margin:0cm;
	mso-para-margin-bottom:.0001pt;
	mso-pagination:widow-orphan;
	font-size:10.0pt;
	font-family:"Times New Roman","serif";}
table.TableNormal
	{mso-style-name:"Table Normal";
	mso-tstyle-rowband-size:0;
	mso-tstyle-colband-size:0;
	mso-style-noshow:yes;
	mso-style-priority:99;
	mso-style-unhide:no;
	mso-style-qformat:yes;
	mso-style-parent:"";
	mso-padding-alt:0cm 5.4pt 0cm 5.4pt;
	mso-para-margin:0cm;
	mso-para-margin-bottom:.0001pt;
	mso-pagination:widow-orphan;
	font-size:10.0pt;
	font-family:"Times New Roman","serif";}
</style>
<![endif]-->
<meta name=Title content=StuTue-GeneiusVis-MC3>
<meta name=Keywords content="">
<!--[if gte mso 9]><xml>
 <o:shapedefaults v:ext="edit" spidmax="5122" style='mso-position-horizontal:right'
  o:allowoverlap="f" fill="f" stroke="f">
  <v:fill on="f"/>
  <v:stroke on="f"/>
 </o:shapedefaults></xml><![endif]--><!--[if gte mso 9]><xml>
 <o:shapelayout v:ext="edit">
  <o:idmap v:ext="edit" data="1"/>
 </o:shapelayout></xml><![endif]-->
</head>

<body bgcolor=white lang=DE link=blue vlink=purple style='tab-interval:36.0pt'>

<div class=Section1>

<p class=MsoNormal align=center style='text-align:center'><b style='mso-bidi-font-weight:
normal'><span style='font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman"'>&quot;Team Stuttgart and Tübingen – GeneiusVis&quot;<o:p></o:p></span></b></p>

<p class=MsoNormal align=center style='text-align:center'><b style='mso-bidi-font-weight:
normal'><span style='font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman"'><o:p>&nbsp;</o:p></span></b></p>

<p class=MsoNormal align=center style='text-align:center'><b style='mso-bidi-font-weight:
normal'><span lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>VAST 2010 Challenge<o:p></o:p></span></b></p>

<p class=MsoNormal align=center style='text-align:center'><b style='mso-bidi-font-weight:
normal'><u><span lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>Genetic Sequences - Tracing the
Mutations of a Disease<o:p></o:p></span></u></b></p>

<p class=MsoNormal><span lang=EN-US style='mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal><span lang=EN-US style='mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Authors and Affiliations:<o:p></o:p></span></b></p>

<p class=MsoNormal style='margin-left:24.0pt;mso-pagination:none;mso-layout-grid-align:
none;text-autospace:none'><i style='mso-bidi-font-style:normal'><span
lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Julian Heinrich, University of Stuttgart, <a
href="mailto:julian.heinrich@visus.uni-stuttgart.de">julian.heinrich@visus.uni-stuttgart.de</a><o:p></o:p></span></i></p>

<p class=MsoNormal style='margin-left:24.0pt;mso-pagination:none;mso-layout-grid-align:
none;text-autospace:none'><i style='mso-bidi-font-style:normal'><span
lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Andre Burkovski, University of Stuttgart, <a
href="mailto:andre.burkovski@visus.uni-stuttgart.de">andre.burkovski@visus.uni-stuttgart.de</a><o:p></o:p></span></i></p>

<p class=MsoNormal style='margin-left:24.0pt;mso-pagination:none;mso-layout-grid-align:
none;text-autospace:none'><i style='mso-bidi-font-style:normal'><span
lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Florian Battke, University of Tübingen, <a
href="mailto:florian.battke@uni-tuebingen.de">florian.battke@uni-tuebingen.de</a><o:p></o:p></span></i></p>

<p class=MsoNormal style='margin-left:24.0pt;mso-pagination:none;mso-layout-grid-align:
none;text-autospace:none'><i style='mso-bidi-font-style:normal'><span
lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Alexander Herbig, University of Tübingen, <a
href="mailto:alexander.herbig@uni-tuebingen.de">alexander.herbig@uni-tuebingen.de</a><o:p></o:p></span></i></p>

<p class=MsoNormal style='margin-left:24.0pt;mso-pagination:none;mso-layout-grid-align:
none;text-autospace:none'><i style='mso-bidi-font-style:normal'><span
lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Stephan Symons, University of Tübingen, <a
href="mailto:symons@informatik.uni-tuebingen.de">symons@informatik.uni-tuebingen.de</a><o:p></o:p></span></i></p>

<p class=MsoNormal style='margin-left:24.0pt;mso-pagination:none;mso-layout-grid-align:
none;text-autospace:none'><i style='mso-bidi-font-style:normal'><span
lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Kay Nieselt, University of Tübingen, <a
href="mailto:kay.nieselt@uni-tuebingen.de">kay.nieselt@uni-tuebingen.de</a></span></i><span
lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p></o:p></span></p>

<p class=MsoNormal><span lang=EN-US style='font-family:"Arial","sans-serif";
mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Tool(s):<o:p></o:p></span></b></p>

<p class=MsoNormal style='margin-left:24.0pt;mso-pagination:none;mso-layout-grid-align:
none;text-autospace:none'><i style='mso-bidi-font-style:normal'><span
lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>In order to solve this mini challenge, a visual
analytics tool was developed, integrating the result of calculating a
phylogenetic tree using the neighbor joining method. For the computation of the
phylogenetic trees, <a href="http://www.clustal.org/">ClustalX</a> was used.
ClustalX is a multiple sequence alignment program; however, the alignment
procedures were not used since the sequences for the challenge were already
aligned. The phylogenetic tree was exported as a Newick file, a standard file
format used in phylogenetics. The developed tool, ‘GeneiusVis’, consists of two
linked views: a Tree Visualizer offering different layouts for phylogenetic
trees as well as interactive node and edge selection, and an alignment viewer
for multiple sequence alignments that allows users to trace mutations of a disease.
Selections of rows in the alignment viewer are linked to the respective nodes
in the Tree Visualizer and vice versa. The alignment viewer provides
interactive computation of consensus sequences from selected rows. The consensus
sequence represents the most frequent nucleotide at each position of the
selected sequences.<o:p></o:p></span></i></p>

<p class=MsoNormal style='margin-left:24.0pt;mso-pagination:none;mso-layout-grid-align:
none;text-autospace:none'><i style='mso-bidi-font-style:normal'><span
lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Additionally, <a href="http://www.r-project.org/">R</a>
was used to compute the mutual information of pairs of columns in a multiple
sequence alignment, as well as to determine the mean evolutionary divergence
between two groups of sequences. Finally, the <a
href="http://www.cs.waikato.ac.nz/ml/weka/">WEKA</a> library was used to
validate the findings.<o:p></o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><span lang=EN-US style='font-family:"Arial","sans-serif";
mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><i
style='mso-bidi-font-style:normal'><span lang=EN-US style='font-family:"Arial","sans-serif";
mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'>Video:</span></i></b><span
lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p></o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><span lang=EN-US style='font-family:"Arial","sans-serif";
mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><a href="index_files/MC3.html">Video</a></span></i><span
lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p></o:p></span></p>

<p class=MsoNormal><span lang=EN-US style='font-family:"Arial","sans-serif";
mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal><span lang=EN-US style='font-family:"Arial","sans-serif";
mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>ANSWERS:<o:p></o:p></span></b></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></b></p>

<div class=MsoNormal align=center style='text-align:center;mso-pagination:none;
mso-layout-grid-align:none;text-autospace:none'><b style='mso-bidi-font-weight:
normal'><span lang=EN-US style='font-family:"Arial","sans-serif";mso-ansi-language:
EN-US'>

<hr size=2 width="100%" align=center>

</span></b></div>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></b></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>MC3.1: What is the region or country of origin for the
current outbreak?&nbsp; </span></b><span lang=EN-US style='font-family:"Arial","sans-serif";
mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'><o:p></o:p></span></p>

<p class=MsoNormal><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></b></p>

<p class=MsoNormal><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Answer: Nigeria_B<o:p></o:p></span></b></p>

<p class=MsoNormal><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></b></p>

<p class=MsoNormal><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>To determine the origin of the virus associated with an
outbreak of the Drafa virus, we conducted genetic analyses of all native
sequences and those of the current disease outbreak. Phylogenetic analyses
based on the nucleotide sequences showed that all viral sequences from the
disease outbreak are very closely related and cluster monophyletically. This
proves that all strains from the current outbreak have one common ancestor, the
strain from Nigeria B (highlighted red in Figure 1). The same answer is found
when using amino acid sequences. In addition, we computed the average
nucleotide divergence between the current Drafa viruses and the native strain
sequences, using R. The minimum is 0.010799, which again is the divergence to
Nigeria B.<o:p></o:p></span></i></p>

<p class=MsoNormal><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></b></p>

<p class=MsoNormal><b style='mso-bidi-font-weight:normal'><span
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-no-proof:yes'><!--[if gte vml 1]><v:shapetype id="_x0000_t75" coordsize="21600,21600"
 o:spt="75" o:preferrelative="t" path="m@4@5l@4@11@9@11@9@5xe" filled="f"
 stroked="f">
 <v:stroke joinstyle="miter"/>
 <v:formulas>
  <v:f eqn="if lineDrawn pixelLineWidth 0"/>
  <v:f eqn="sum @0 1 0"/>
  <v:f eqn="sum 0 0 @1"/>
  <v:f eqn="prod @2 1 2"/>
  <v:f eqn="prod @3 21600 pixelWidth"/>
  <v:f eqn="prod @3 21600 pixelHeight"/>
  <v:f eqn="sum @0 0 1"/>
  <v:f eqn="prod @6 1 2"/>
  <v:f eqn="prod @7 21600 pixelWidth"/>
  <v:f eqn="sum @8 21600 0"/>
  <v:f eqn="prod @7 21600 pixelHeight"/>
  <v:f eqn="sum @10 21600 0"/>
 </v:formulas>
 <v:path o:extrusionok="f" gradientshapeok="t" o:connecttype="rect"/>
 <o:lock v:ext="edit" aspectratio="t"/>
</v:shapetype><v:shape id="Picture_x0020_2" o:spid="_x0000_i1038" type="#_x0000_t75"
 alt="FullTree" style='width:890.25pt;height:542.25pt;visibility:visible;
 mso-wrap-style:square'>
 <v:imagedata src="index_files/image001.jpg" o:title="FullTree"/>
</v:shape><![endif]--><![if !vml]><img border=0 width=1187 height=723
src="index_files/image002.jpg" alt=FullTree v:shapes="Picture_x0020_2"><![endif]></span></b><b
style='mso-bidi-font-weight:normal'><span lang=EN-US style='font-family:"Arial","sans-serif";
mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'><o:p></o:p></span></b></p>

<p class=MsoCaption><span lang=EN-US style='mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Figure </span><!--[if supportFields]><span lang=EN-US
style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'><span
style='mso-element:field-begin'></span><span
style='mso-spacerun:yes'> </span>SEQ Figure \* ARABIC <span style='mso-element:
field-separator'></span></span><![endif]--><span lang=EN-US style='mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>1</span><!--[if supportFields]><span
lang=EN-US style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:
EN-US'><span style='mso-element:field-end'></span></span><![endif]--><span
lang=EN-US style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:
EN-US'>: A phylogenetic tree of all sequences in the Tree Visualizer. The
native strain sharing the lowest common ancestor with all strains of the
current outbreak is highlighted in red.<o:p></o:p></span></p>

<p class=MsoNormal><span lang=EN-US style='mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></p>

<div class=MsoNormal align=center style='text-align:center;mso-pagination:none;
mso-layout-grid-align:none;text-autospace:none'><b style='mso-bidi-font-weight:
normal'><span lang=EN-US style='font-family:"Arial","sans-serif";mso-ansi-language:
EN-US'>

<hr size=2 width="100%" align=center>

</span></b></div>

<p class=MsoNormal><span lang=EN-US style='font-size:14.0pt;font-family:"Helvetica","sans-serif";
mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>MC3.2: Over time, the virus spreads and the diversity
of the virus increases as it mutates. Two patients infected with the Drafa virus
are in the same hospital as Nicolai. Nicolai has a strain identified by
sequence 583. One patient has a strain identified by sequence 123 and the other
has a strain identified by sequence 51. Assume only a single viral strain is in
each patient. Which patient likely contracted the illness from Nicolai and why?<o:p></o:p></span></b></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></b></p>

<p class=MsoNormal><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Answer: ID 123<o:p></o:p></span></b></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></b></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>After performing a phylogenetic analysis of the
nucleotide sequences restricted to the sequences of the current disease
outbreak, we imported the resulting tree into the Tree Visualizer. The Alignment
Viewer can be used to sort and select IDs more efficiently. The corresponding
nodes are simultaneously selected and highlighted in the tree. We selected the
three IDs with labels 583, 123 and 51, and interactively highlighted them in red.
From the tree, it is evident that 123 is much closer to 583 than the sequence
with ID 51. This is validated by the evolutionary divergence of 583 and 123,
which is 0.000713, while the evolutionary divergence of 583 and 51 is 0.002141.
The same answer is found when using amino acid sequences.<o:p></o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></b></p>

<table class=TableNormal border=1 cellspacing=0 cellpadding=0 style='border-collapse:
 collapse;border:none;mso-border-alt:solid windowtext .5pt;mso-yfti-tbllook:
 1184;mso-padding-alt:0cm 5.4pt 0cm 5.4pt'>
 <tr style='mso-yfti-irow:0;mso-yfti-firstrow:yes;mso-yfti-lastrow:yes'>
  <td width=284 valign=top style='width:212.9pt;border:solid windowtext 1.0pt;
  mso-border-alt:solid windowtext .5pt;padding:0cm 5.4pt 0cm 5.4pt'>
  <p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
  text-autospace:none'><b style='mso-bidi-font-weight:normal'><span
  style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
  "Times New Roman";mso-no-proof:yes'><!--[if gte vml 1]><v:shape id="Picture_x0020_4"
   o:spid="_x0000_i1037" type="#_x0000_t75" alt="DiseaseTree" style='width:8in;
   height:348pt;visibility:visible;mso-wrap-style:square'>
   <v:imagedata src="index_files/image003.jpg" o:title="DiseaseTree"/>
  </v:shape><![endif]--><![if !vml]><img border=0 width=768 height=464
  src="index_files/image004.jpg" alt=DiseaseTree v:shapes="Picture_x0020_4"><![endif]></span></b><b
  style='mso-bidi-font-weight:normal'><span style='font-size:13.0pt;font-family:
  "Arial","sans-serif";mso-bidi-font-family:"Times New Roman"'><o:p></o:p></span></b></p>
  </td>
  <td width=284 valign=top style='width:212.9pt;border:solid windowtext 1.0pt;
  border-left:none;mso-border-left-alt:solid windowtext .5pt;mso-border-alt:
  solid windowtext .5pt;padding:0cm 5.4pt 0cm 5.4pt'>
  <p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
  text-autospace:none'><b style='mso-bidi-font-weight:normal'><span
  style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
  "Times New Roman";mso-no-proof:yes'><!--[if gte vml 1]><v:shape id="Picture_x0020_5"
   o:spid="_x0000_i1036" type="#_x0000_t75" alt="mc3" style='width:353.25pt;
   height:284.25pt;visibility:visible;mso-wrap-style:square'>
   <v:imagedata src="index_files/image005.png" o:title="mc3"/>
  </v:shape><![endif]--><![if !vml]><img border=0 width=471 height=379
  src="index_files/image006.png" alt=mc3 v:shapes="Picture_x0020_5"><![endif]></span></b><b
  style='mso-bidi-font-weight:normal'><span style='font-size:13.0pt;font-family:
  "Arial","sans-serif";mso-bidi-font-family:"Times New Roman"'><o:p></o:p></span></b></p>
  </td>
 </tr>
</table>

<p class=MsoCaption><span lang=EN-US style='mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Figure </span><!--[if supportFields]><span lang=EN-US
style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'><span
style='mso-element:field-begin'></span><span
style='mso-spacerun:yes'> </span>SEQ Figure \* ARABIC <span style='mso-element:
field-separator'></span></span><![endif]--><span lang=EN-US style='mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>2</span><!--[if supportFields]><span
lang=EN-US style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:
EN-US'><span style='mso-element:field-end'></span></span><![endif]--><span
lang=EN-US style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:
EN-US'>: Phylogenetic tree and alignment of all current outbreak sequences.
Selection of strains in the alignment viewer automatically highlights the respective
nodes in the tree. </span><span lang=EN-US style='font-size:14.0pt;font-family:
"Helvetica","sans-serif";mso-bidi-font-family:"Times New Roman";mso-ansi-language:
EN-US;font-weight:normal'><o:p></o:p></span></p>

<p class=MsoCaption><span lang=EN-US style='font-size:13.0pt;font-family:"Arial","sans-serif";
mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></p>

<div class=MsoNormal align=center style='text-align:center;mso-pagination:none;
mso-layout-grid-align:none;text-autospace:none'><b style='mso-bidi-font-weight:
normal'><span lang=EN-US style='font-family:"Arial","sans-serif";mso-ansi-language:
EN-US'>

<hr size=2 width="100%" align=center>

</span></b></div>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></b></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>MC3.3: Signs and symptoms of the
Drafa virus are varied and humans react differently to infection. Some mutant
strains from the current outbreak have been reported as being worse than others
for the patients that come in contact with them.</span></b><span lang=EN-US
style='font-size:16.0pt;mso-bidi-font-family:"Times New Roman";mso-ansi-language:
EN-US'><o:p></o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>Identify the top 3 mutations that
lead to an increase in symptom severity (a disease characteristic). The
mutations involve one or more base substitutions. For this question, the
biological properties of the underlying amino acid sequence patterns are not
significant in determining disease characteristics.</span></b><span lang=EN-US
style='font-size:16.0pt;mso-bidi-font-family:"Times New Roman";mso-ansi-language:
EN-US'><o:p></o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>For each mutation provide the base
substitutions and their position in the sequence (left to right) where the base
substitutions occurred. For example,</span></b><span lang=EN-US
style='font-size:16.0pt;mso-bidi-font-family:"Times New Roman";mso-ansi-language:
EN-US'><o:p></o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>C -&gt; G, 456 (C changed to G at
position 456)</span></b><span lang=EN-US style='font-size:16.0pt;mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'><o:p></o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>G -&gt; A, 513 and T -&gt; A, 907 (G
changed to A at position 513 and T changed to A at position 907)</span></b><span
lang=EN-US style='font-size:16.0pt;mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p></o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>A -&gt; G, 39 (A changed to G at
position 39)<o:p></o:p></span></b></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><span lang=EN-US style='font-size:16.0pt;mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Answer: <o:p></o:p></span></b></p>

<p class=MsoNormal><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>A </span></b><b style='mso-bidi-font-weight:normal'><span
lang=EN-US style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>-&gt;</span></b><b style='mso-bidi-font-weight:
normal'><span lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'> G, 223<o:p></o:p></span></b></p>

<p class=MsoNormal><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>A </span></b><b style='mso-bidi-font-weight:normal'><span
lang=EN-US style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>-&gt;</span></b><b style='mso-bidi-font-weight:
normal'><span lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'> C, 269<o:p></o:p></span></b></p>

<p class=MsoNormal><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>T </span></b><b style='mso-bidi-font-weight:normal'><span
lang=EN-US style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>-&gt;</span></b><b style='mso-bidi-font-weight:
normal'><span lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'> C, 109<o:p></o:p></span></b></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>For all following tasks, nucleotides and disease
characteristics (with increasing severity from 0 to 2) have been mapped to
colors and opacity. <o:p></o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;page-break-after:avoid;
mso-layout-grid-align:none;text-autospace:none'><i style='mso-bidi-font-style:
normal'><span style='font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-no-proof:yes'><!--[if gte vml 1]><v:shape id="Picture_x0020_7"
 o:spid="_x0000_i1035" type="#_x0000_t75" alt="mc3" style='width:350.25pt;
 height:695.25pt;visibility:visible;mso-wrap-style:square'>
 <v:imagedata src="index_files/image007.png" o:title="mc3"/>
</v:shape><![endif]--><![if !vml]><img border=0 width=467 height=927
src="index_files/image008.png" alt=mc3 v:shapes="Picture_x0020_7"><![endif]></span></i><span
lang=EN-US style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:
EN-US'><o:p></o:p></span></p>

<p class=MsoCaption><span lang=EN-US style='mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Figure </span><!--[if supportFields]><span lang=EN-US
style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'><span
style='mso-element:field-begin'></span><span
style='mso-spacerun:yes'> </span>SEQ Figure \* ARABIC <span style='mso-element:
field-separator'></span></span><![endif]--><span lang=EN-US style='mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>3</span><!--[if supportFields]><span
lang=EN-US style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:
EN-US'><span style='mso-element:field-end'></span></span><![endif]--><span
lang=EN-US style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:
EN-US'>: Alignment Viewer with disease characteristics.<o:p></o:p></span></p>

<p class=MsoNormal><span lang=EN-US style='mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>We sorted all sequences by symptom severity and
computed the consensus sequence for every severity group. The color of the
consensus nucleotide corresponds to the most frequent one of the group while
opacity reflects its relative frequency and thereby the degree of conservation
in the respective group. The most prominent correlations of columns with the opacity
of symptom severity occur in columns 22, 79, 109, 161, 223, 269, 842 and 946. As
positions 22, 79, 161, 842 and 946 turn out to be correlated with other disease
characteristics (see below), only 109, 223 and 269 remain.<o:p></o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;page-break-after:avoid;
mso-layout-grid-align:none;text-autospace:none'><i style='mso-bidi-font-style:
normal'><span style='font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-no-proof:yes'><!--[if gte vml 1]><v:shape id="Picture_x0020_8"
 o:spid="_x0000_i1034" type="#_x0000_t75" alt="mc3" style='width:549.75pt;
 height:107.25pt;visibility:visible;mso-wrap-style:square'>
 <v:imagedata src="index_files/image009.png" o:title="mc3"/>
</v:shape><![endif]--><![if !vml]><img border=0 width=733 height=143
src="index_files/image009.png" alt=mc3 v:shapes="Picture_x0020_8"><![endif]></span></i><span
lang=EN-US style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:
EN-US'><o:p></o:p></span></p>

<p class=MsoCaption><span lang=EN-US style='mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Figure </span><!--[if supportFields]><span lang=EN-US
style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'><span
style='mso-element:field-begin'></span><span
style='mso-spacerun:yes'> </span>SEQ Figure \* ARABIC <span style='mso-element:
field-separator'></span></span><![endif]--><span lang=EN-US style='mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>4</span><!--[if supportFields]><span
lang=EN-US style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:
EN-US'><span style='mso-element:field-end'></span></span><![endif]--><span
lang=EN-US style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:
EN-US'>: Three consensus sequences grouped by strains with equal symptom
severity.<o:p></o:p></span></p>

<p class=MsoNormal><span lang=EN-US style='mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></p>

<div class=MsoNormal align=center style='text-align:center;mso-pagination:none;
mso-layout-grid-align:none;text-autospace:none'><b style='mso-bidi-font-weight:
normal'><span lang=EN-US style='font-family:"Arial","sans-serif";mso-ansi-language:
EN-US'>

<hr size=2 width="100%" align=center>

</span></b></div>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><span lang=EN-US style='font-size:16.0pt;mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>MC3.4:&nbsp; Due to the rapid spread
of the virus and limited resources, medical personnel would like to focus on
treatments and quarantine procedures for the worst of the mutant strains from
the current outbreak, not just symptoms as in the previous question. To find
the most dangerous viral mutants, experts are monitoring multiple disease
characteristics.</span></b><span lang=EN-US style='font-size:16.0pt;mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'><o:p></o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>Consider each virulence and drug
resistance characteristic as equally important. Identify the top 3 mutations
that lead to the most dangerous viral strains. The mutations involve one or
more base substitutions.&nbsp; In a worst case scenario, a very dangerous
strain could cause severe symptoms, have high mortality, cause major
complications, exhibit resistance to anti viral drugs, and target high risk
groups. For this question, the biological properties of the underlying amino
acid sequence patterns are not significant in determining disease
characteristics.</span></b><span lang=EN-US style='font-size:16.0pt;mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'><o:p></o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>For each mutation provide the base
substitutions and their position in the sequence (left to right) where the base
substitutions occurred. For example,</span></b><span lang=EN-US
style='font-size:16.0pt;mso-bidi-font-family:"Times New Roman";mso-ansi-language:
EN-US'><o:p></o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>C -&gt; G, 456 (C changed to G at
position 456)</span></b><span lang=EN-US style='font-size:16.0pt;mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'><o:p></o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>G -&gt; A, 513 and T -&gt; A, 907 (G
changed to A at position 513 and T changed to A at position 907)</span></b><span
lang=EN-US style='font-size:16.0pt;mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p></o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>A -&gt; G, 39 (A changed to G at
position 39).<o:p></o:p></span></b></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><span lang=EN-US style='font-size:16.0pt;mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Answer: <o:p></o:p></span></b></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>T </span></b><b style='mso-bidi-font-weight:normal'><span
lang=EN-US style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>-&gt;</span></b><span lang=EN-US
style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'> </span><b
style='mso-bidi-font-weight:normal'><span lang=EN-US style='font-family:"Arial","sans-serif";
mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'>C, 842 and A </span></b><b
style='mso-bidi-font-weight:normal'><span lang=EN-US style='font-size:13.0pt;
font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>-&gt; </span></b><b style='mso-bidi-font-weight:normal'><span
lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>T, 946<span style='mso-spacerun:yes'>  </span><o:p></o:p></span></b></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>G </span></b><b style='mso-bidi-font-weight:normal'><span
lang=EN-US style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>-&gt; </span></b><b
style='mso-bidi-font-weight:normal'><span lang=EN-US style='font-family:"Arial","sans-serif";
mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'>C, 161 and T </span></b><b
style='mso-bidi-font-weight:normal'><span lang=EN-US style='font-size:13.0pt;
font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>-&gt; </span></b><b style='mso-bidi-font-weight:normal'><span
lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>C, 790 <o:p></o:p></span></b></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>G </span></b><b style='mso-bidi-font-weight:normal'><span
lang=EN-US style='font-size:13.0pt;font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'>-&gt; </span></b><b
style='mso-bidi-font-weight:normal'><span lang=EN-US style='font-family:"Arial","sans-serif";
mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'>C, 22 and C </span></b><b
style='mso-bidi-font-weight:normal'><span lang=EN-US style='font-size:13.0pt;
font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>-&gt; </span></b><b style='mso-bidi-font-weight:normal'><span
lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>A, 79 <o:p></o:p></span></b></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><span lang=EN-US style='font-size:16.0pt;mso-bidi-font-family:
"Times New Roman";mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Our general approach is to associate the genotype of a
strain with its disease characteristics, the phenotype, in a matrix based
alignment view. Symptom characteristics were mapped to integers and added as
meta information to the nucleotide alignment. An additional column summing the
symptoms for each patient was added as a scoring function for overall virulence.
Columns can be moved, hidden and sorted. In the alignment viewer, each position
is colored either by nucleotide or attribute value. For attributes, a
single-hue (red) was used with opacity denoting the attribute value. If rows
are selected, a consensus sequence can be computed which is then shown instead
of the rows it represents. The nucleotide of the consensus sequence at position
i is chosen as the one with largest frequency: arg max<sub>c</sub> {f(c,i), c
in {A,G,C,T}}. Here, opacity is mapped to the relative frequency of the
nucleotide in the consensus, reflecting the degree of conservation of a
nucleotide in the consensus. Several consensus sequences can also be joined to
a new consensus sequence, allowing the user to interactively build a ‘consensus
tree’. Finally, for attribute values the average is taken as consensus instead
of the most frequent occurrence. This makes sense, as disease characteristics have
been mapped to a linear scale previously. <o:p></o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>We first noted that many positions in the alignment
are perfectly conserved, i.e. all strains have an identical nucleotide at that
position. Since conserved positions cannot contribute to virulence of a mutant,
we (automatically) removed these positions from further considerations. We also
removed all columns for which just one strain differed from the other strains.
These singular mutations define the individual strain identity, but not mutant
virulence. <o:p></o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>We then compared the remaining 14 columns with the
virulence score (the sum over all attribute values). The entries of the score
range from 1 to 8. First, we sorted all rows according to the virulence score.
Next we examined whether all 8 levels of phenotypes are represented by
different consensus sequences. The main idea is to find visual correlations of
the opacity of an alignment column with the opacity of the phenotype
attributes. Again we searched for the visually most prominent correlation of
alignment and attribute columns. However, for the remaining 14 columns we see
that such a fine resolution into 8 phenotypes is not reflected by the consensus
sequences (Figure 5).<o:p></o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></i></p>

<table class=TableNormal border=1 cellspacing=0 cellpadding=0 style='border-collapse:
 collapse;border:none;mso-border-alt:solid windowtext .5pt;mso-yfti-tbllook:
 1184;mso-padding-alt:0cm 5.4pt 0cm 5.4pt'>
 <tr style='mso-yfti-irow:0;mso-yfti-firstrow:yes;mso-yfti-lastrow:yes'>
  <td width=567 valign=top style='width:425.2pt;border:solid windowtext 1.0pt;
  mso-border-alt:solid windowtext .5pt;padding:0cm 5.4pt 0cm 5.4pt'>
  <p class=MsoNormal style='mso-pagination:none;page-break-after:avoid;
  mso-layout-grid-align:none;text-autospace:none'><span style='mso-bidi-font-family:
  "Times New Roman";mso-no-proof:yes'><!--[if gte vml 1]><v:shape id="Picture_x0020_10"
   o:spid="_x0000_i1033" type="#_x0000_t75" alt="mc3" style='width:414.75pt;
   height:221.25pt;visibility:visible;mso-wrap-style:square'>
   <v:imagedata src="index_files/image010.png" o:title="mc3"/>
  </v:shape><![endif]--><![if !vml]><img border=0 width=553 height=295
  src="index_files/image011.png" alt=mc3 v:shapes="Picture_x0020_10"><![endif]></span><span
  style='mso-bidi-font-family:"Times New Roman"'><o:p></o:p></span></p>
  <p class=MsoCaption><span lang=EN-US style='mso-bidi-font-family:"Times New Roman";
  mso-ansi-language:EN-US'>Figure </span><!--[if supportFields]><span
  style='mso-bidi-font-family:"Times New Roman"'><span style='mso-element:field-begin'></span></span><span
  lang=EN-US style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:
  EN-US'><span style='mso-spacerun:yes'> </span>SEQ Figure \* ARABIC </span><span
  style='mso-bidi-font-family:"Times New Roman"'><span style='mso-element:field-separator'></span></span><![endif]--><span
  lang=EN-US style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:
  EN-US'>5</span><!--[if supportFields]><span style='mso-bidi-font-family:"Times New Roman"'><span
  style='mso-element:field-end'></span></span><![endif]--><span lang=EN-US
  style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'>: 8
  consensus sequences of all sequences with virulence score levels 1, 2, ...,
  8, respectively.</span><i style='mso-bidi-font-style:normal'><span
  lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
  mso-ansi-language:EN-US'><o:p></o:p></span></i></p>
  </td>
  <td width=653 valign=top style='width:489.8pt;border:solid windowtext 1.0pt;
  border-left:none;mso-border-left-alt:solid windowtext .5pt;mso-border-alt:
  solid windowtext .5pt;padding:0cm 5.4pt 0cm 5.4pt'>
  <p class=MsoNormal style='mso-pagination:none;page-break-after:avoid;
  mso-layout-grid-align:none;text-autospace:none'><span style='mso-bidi-font-family:
  "Times New Roman";mso-no-proof:yes'><!--[if gte vml 1]><v:shape id="Picture_x0020_11"
   o:spid="_x0000_i1032" type="#_x0000_t75" alt="mc3" style='width:414.75pt;
   height:149.25pt;visibility:visible;mso-wrap-style:square'>
   <v:imagedata src="index_files/image012.png" o:title="mc3"/>
  </v:shape><![endif]--><![if !vml]><img border=0 width=553 height=199
  src="index_files/image013.png" alt=mc3 v:shapes="Picture_x0020_11"><![endif]></span><span
  style='mso-bidi-font-family:"Times New Roman"'><o:p></o:p></span></p>
  <p class=MsoCaption><span lang=EN-US style='mso-bidi-font-family:"Times New Roman";
  mso-ansi-language:EN-US'>Figure </span><!--[if supportFields]><span
  style='mso-bidi-font-family:"Times New Roman"'><span style='mso-element:field-begin'></span></span><span
  lang=EN-US style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:
  EN-US'><span style='mso-spacerun:yes'> </span>SEQ Figure \* ARABIC </span><span
  style='mso-bidi-font-family:"Times New Roman"'><span style='mso-element:field-separator'></span></span><![endif]--><span
  lang=EN-US style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:
  EN-US'>6</span><!--[if supportFields]><span style='mso-bidi-font-family:"Times New Roman"'><span
  style='mso-element:field-end'></span></span><![endif]--><span lang=EN-US
  style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'>: 4
  consensus sequences corresponding to 4 levels of overall virulence. For
  clarity only the colors and corresponding opacity are shown. The tooltip of a cell
  shows the underlying distribution of nucleotides.</span><i style='mso-bidi-font-style:
  normal'><span lang=EN-US style='font-family:"Arial","sans-serif";mso-bidi-font-family:
  "Times New Roman";mso-ansi-language:EN-US'><o:p></o:p></span></i></p>
  </td>
 </tr>
</table>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Since our tool efficiently allows the visual
comparison of consensus sequences that can be quickly computed from selected
rows, we gradually reduced the resolution of the overall phenotype groups from 8
to 4. The 4 phenotypes would correspond to very low (scores 1 and 2), low (scores
3,4), medium (scores 5,6) and high (scores 7,8) (Figure 6). We see four overall
patterns of alignment columns: <o:p></o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>1: decreasing opacity, indicating increasing mutation
rate with increased virulence <o:p></o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>2: increasing opacity, indicating decreasing mutation
rate with increased virulence <o:p></o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>3: one color but not with steadily increasing or
decreasing opacity, and <o:p></o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>4: columns with more than one color, indicating that
the majority of strains in that group have a different nucleotide at that
position than all other strains. <o:p></o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Positions 842, 161 and 790 belong to pattern 1,
positions 22, 79 and 946 are from pattern number 4.<o:p></o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>However, we also noted some uncertainty in this decision. Other
positions could also be chosen as candidates. One observation that we made is
that individual disease characteristics lead to different contributions from
individual positions. We successively repeated our analyses with each of the 6
attribute columns, and found that positions 161 and 790 mainly lead to worse
'complications', positions 22,79 (and possibly 1033) and 842,946 nicely correlate
with 'drug resistance' (Figure 7). As ‘complications’ seem to become more
severe with ‘increasing drug resistance’, these positions obviously cause
increasing overall virulence.<o:p></o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-no-proof:yes'><!--[if gte vml 1]><v:shape id="Bild_x0020_15" o:spid="_x0000_i1031"
 type="#_x0000_t75" style='width:168.75pt;height:498pt;visibility:visible;
 mso-wrap-style:square'>
 <v:imagedata src="index_files/image016.png" o:title="mc3.4"/>
</v:shape><![endif]--><![if !vml]><img border=0 width=225 height=664
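src="index_files/image016.png" alt="Reduced alignment with attributes but without labels, sorted by complications and drug resistance" v:shapes="Bild_x0020_15"><![endif]></span></i><i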
style='mso-bidi-font-style:normal'><span lang=EN-US style='font-family:"Arial","sans-serif";
mso-bidi-font-family:"Times New Roman";mso-ansi-language:EN-US'><o:p></o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><b><span lang=EN-US style='mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Figure 7: The reduced alignment with attributes but
without labels, sorted by ‘complications’ and ‘drug resistance’.<o:p></o:p></span></b></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Using color without labels, as in Figure 7, helps the
researcher to identify patterns among columns. E.g., sorting rows according to ‘drug
resistance’, we immediately see that it is correlated with position 790: all
strains with major complications have a ‘C’ (blue color), while the other
strains except for two strains with minor complications have a ‘T’ (purple
color) at that position. We also nicely see the correlated mutation patterns of
positions 22, 79 and possibly 1033 as well as positions 842 and 946.<o:p></o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Using the statistics package R, we also determined which
positions are correlated. To this end, we computed the pairwise mutual information
and visualized the results in a heatmap (Figure 8). The heatmap quickly allows
the identification of cells with large mutual information values, which correspond
to pairs of highly correlated columns.<o:p></o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;page-break-after:avoid;
mso-layout-grid-align:none;text-autospace:none'><i style='mso-bidi-font-style:
normal'><span style='font-family:"Arial","sans-serif";mso-bidi-font-family:
"Times New Roman";mso-no-proof:yes'><!--[if gte vml 1]><v:shape id="Picture_x0020_12"
 o:spid="_x0000_i1030" type="#_x0000_t75" alt="CurrentOutbreakSeq_MI_sub-sub"
 style='width:300pt;height:365.25pt;visibility:visible;mso-wrap-style:square'>
 <v:imagedata src="index_files/image014.png" o:title="CurrentOutbreakSeq_MI_sub-sub"/>
</v:shape><![endif]--><![if !vml]><img border=0 width=400 height=487
src="index_files/image014.png" alt="CurrentOutbreakSeq_MI_sub-sub" v:shapes="Picture_x0020_12"><![endif]></span></i><span
lang=EN-US style='mso-bidi-font-family:"Times New Roman";mso-ansi-language:
EN-US'><o:p></o:p></span></p>

<p class=MsoCaption><span lang=EN-US style='mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Figure 8: Heatmap of pairwise mutual information of
selected columns in alignment.<o:p></o:p></span></p>

<p class=Normal><span lang=EN-US style='mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>We see several possible pairs of correlated mutations.
Positions 161, 790, 842 and 946 are highly correlated. Furthermore, positions 22
and 79 show a significant correlation with each other, as well as with position number 161.
Altogether our top mutations for overall virulence are columns 842, 946 and
columns 22,79 and columns 790,161. <o:p></o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></i></p>

<p class=MsoNormal style='mso-pagination:none;mso-layout-grid-align:none;
text-autospace:none'><i style='mso-bidi-font-style:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'>Efforts: one team member applied the tools offered by
the WEKA library to identify the best features to do a classification of the
strains with respect to their symptoms (1 day). Another team member implemented
a mutual information analysis in R in order to identify pairwise correlated
columns in the alignment (1 day). One team member implemented the alignment
viewer using the Qt toolkit in about one week. The tree visualizer was already
implemented in Java and needed only to be extended for communication with the
alignment viewer (1 day).<o:p></o:p></span></i></p>

<p class=MsoNormal><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></b></p>

<div class=MsoNormal align=center style='text-align:center;mso-pagination:none;
mso-layout-grid-align:none;text-autospace:none'><b style='mso-bidi-font-weight:
normal'><span lang=EN-US style='font-family:"Arial","sans-serif";mso-ansi-language:
EN-US'>

<hr size=2 width="100%" align=center>

</span></b></div>

<p class=MsoNormal><b style='mso-bidi-font-weight:normal'><span lang=EN-US
style='font-family:"Arial","sans-serif";mso-bidi-font-family:"Times New Roman";
mso-ansi-language:EN-US'><o:p>&nbsp;</o:p></span></b></p>

</div>

</body>

</html>